package u1;

import static java.lang.System.*;

import java.io.IOException;
import java.io.InputStream;
import java.io.PrintWriter;
import java.io.StringWriter;

import org.xml.sax.SAXException;

/**
 * Takes an uncompressed enwiki XML dump on stdin and produces some statistics
 * on stdout.
 *
 * <p>All counting happens while the input is parsed in the constructor; the
 * getters only report the totals accumulated at that point. Text lengths are
 * measured with {@link String#length()}, i.e. in UTF-16 code units.
 */
public class Stats {
  /**
   * Parses standard input and prints the resulting statistics to standard
   * output.
   *
   * @param argv command-line arguments (unused)
   * @throws SAXException if thrown while parsing the input
   * @throws IOException if thrown while reading the input
   */
  public static void main(String[] argv) throws SAXException, IOException {
    out.println(new Stats(in));
  }

  /** Number of pages reported by the reader so far. */
  private int pageCount = 0;

  /** Sum of {@code text.length()} over all pages reported so far. */
  private long totalLength = 0;

  /**
   * Parses the given stream and accumulates the page count and the total text
   * length of every page the reader reports.
   *
   * @param is the stream handed to {@code PageReader.parse}
   * @throws SAXException if {@code PageReader.parse} throws it
   * @throws IOException if {@code PageReader.parse} throws it
   */
  public Stats(InputStream is) throws SAXException, IOException {
    PageReader pages = new PageReader() {
      @Override
      public void readPage(String title, String text) {
        // Only the text contributes to the statistics; the title is ignored.
        pageCount += 1;
        totalLength += text.length();
      }
    };
    pages.parse(is);
  }

  /**
   * @return the number of pages that were read
   */
  public int getPageCount() {
    return pageCount;
  }

  /**
   * @return the summed text length of all pages that were read
   */
  public long getTotalTextLength() {
    return totalLength;
  }

  /**
   * Computes the arithmetic mean of the text length per page.
   *
   * @return the total text length divided by the page count, or {@code 0} if
   *         no pages were read
   */
  public double getMeanTextLength() {
    if (pageCount == 0) {
      return 0;
    }
    // Promote to double before dividing: long / int is integer division and
    // would silently drop the fractional part of the mean.
    return (double) totalLength / pageCount;
  }

  /**
   * Renders the statistics as three tab-aligned lines: page count, mean text
   * length and total text length, each terminated by a line separator.
   */
  @Override
  public String toString() {
    StringWriter sw = new StringWriter();
    PrintWriter p = new PrintWriter(sw);
    p.println("pages:\t\t\t" + getPageCount());
    p.println("mean text length (ch):\t" + getMeanTextLength());
    p.println("total text length (ch):\t" + getTotalTextLength());
    return sw.toString();
  }
}
/*
* Copyright (c) 2009 John Lees-Miller
* 
* Permission is hereby granted, free of charge, to any person
* obtaining a copy of this software and associated documentation
* files (the "Software"), to deal in the Software without
* restriction, including without limitation the rights to use,
* copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the
* Software is furnished to do so, subject to the following
* conditions:
* 
* The above copyright notice and this permission notice shall be
* included in all copies or substantial portions of the Software.
* 
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
* OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
* HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
* WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
* OTHER DEALINGS IN THE SOFTWARE.
*/

